# encoding=utf-8

# sys.path.append("../main")
# https://blog.csdn.net/songzhilian22/article/details/49636725
# https://www.libinx.com/2018/text-classification-classic-ml-by-sklearn/

import pandas as pd

import src.core.PandasUtils as pandasutils

# Path of the training CSV; relative, so it resolves against the current
# working directory at run time.
_TRAINING_CSV = "../../data/training.csv"


def _shift_type(raw):
    """Return *raw* converted to ``int`` and lowered by one."""
    return int(raw) - 1


# Read the CSV and rename its columns to "type" and "text".
# NOTE(review): read_csv consumes the first row as a header by default --
# confirm the file really starts with a header row.
data = pd.read_csv(_TRAINING_CSV)
data.columns = ["type", "text"]

# Replace every entry of the "type" column with int(entry) - 1.
data["type"] = data["type"].map(_shift_type)

# Hand the frame's underlying array to the project helper that builds `df`.
values = data.values
df = pandasutils.convert2KeywordsDataframs(values)
